import pandas  as pd

"""
wangosng 2021-10-16
dataloader 
"""

# Locations of the three Excel workbooks consumed by getdata().
# The paths are relative, so they resolve against the current working directory.
MD_PATH: str = "data/Molecular_Descriptor.xlsx"  # molecular descriptors
ER_PATH: str = "data/ERα_activity.xlsx"  # ERα activity
AD_PATH: str = "data/ADMET.xlsx"  # ADMET table (also provides the SMILES column)


def getdata():
    """Load the 'training' and 'test' sheets of the three Excel workbooks.

    The workbooks are located by the module-level constants ``MD_PATH``,
    ``ER_PATH`` and ``AD_PATH``. Each workbook is opened once and both
    sheets are read in a single pass.

    Returns:
        An 8-tuple, in this order:
        ``md_train``, ``md_test``   -- DataFrames read from ``MD_PATH``
        ``er_train``, ``er_test``   -- DataFrames read from ``ER_PATH``
        ``ad_train``, ``ad_test``   -- DataFrames read from ``AD_PATH``
        ``molecular_train``, ``molecular_test`` -- the ``'SMILES'`` column
        of ``ad_train`` / ``ad_test`` as plain Python lists.

    Raises:
        KeyError: if the ADMET sheets have no ``'SMILES'`` column.
        Whatever ``pandas.read_excel`` raises for a missing file or sheet.
    """

    def _load_splits(path):
        # A list of sheet names makes pandas parse the workbook once and
        # return a {sheet_name: DataFrame} dict, instead of re-opening the
        # file for every sheet.
        sheets = pd.read_excel(path, sheet_name=['training', 'test'])
        return sheets['training'], sheets['test']

    # Molecular descriptors (original author's note: 1974x730 / 50x730).
    md_train, md_test = _load_splits(MD_PATH)

    # Biological activity (original author's note: 1974x3 / 50x3).
    er_train, er_test = _load_splits(ER_PATH)

    # Pharmacokinetics / ADMET (original author's note: 1974x6 / 50x6).
    ad_train, ad_test = _load_splits(AD_PATH)

    # The SMILES strings are taken from the ADMET sheets.
    molecular_train = ad_train['SMILES'].tolist()
    molecular_test = ad_test['SMILES'].tolist()

    return (
        md_train, md_test,
        er_train, er_test,
        ad_train, ad_test,
        molecular_train, molecular_test,
    )
